@article{silver2016mastering,
  author    = {Silver, David and Huang, Aja and Maddison, Chris J and Guez, Arthur and Sifre, Laurent and van den Driessche, George and Schrittwieser, Julian and Antonoglou, Ioannis and Panneershelvam, Veda and Lanctot, Marc and others},
  title     = {Mastering the game of {Go} with deep neural networks and tree search},
  journal   = {Nature},
  volume    = {529},
  number    = {7587},
  pages     = {484--489},
  year      = {2016},
  publisher = {Nature Publishing Group},
}




@inproceedings{fayjie2018driverless,
  author       = {Fayjie, Abdur R and Hossain, Sabir and Oualid, Doukhi and Lee, Deok-Jin},
  title        = {Driverless car: Autonomous driving using deep reinforcement learning in urban environment},
  booktitle    = {2018 15th International Conference on Ubiquitous Robots ({UR})},
  pages        = {896--901},
  year         = {2018},
  organization = {IEEE},
}


@article{prasad2017reinforcement,
  author        = {Prasad, Niranjani and Cheng, Li-Fang and Chivers, Corey and Draugelis, Michael and Engelhardt, Barbara E},
  title         = {A reinforcement learning approach to weaning of mechanical ventilation in intensive care units},
  journal       = {arXiv preprint arXiv:1704.06300},
  year          = {2017},
  eprint        = {1704.06300},
  archiveprefix = {arXiv},
}

@article{deng2016deep,
  author    = {Deng, Yue and Bao, Feng and Kong, Youyong and Ren, Zhiquan and Dai, Qionghai},
  title     = {Deep direct reinforcement learning for financial signal representation and trading},
  journal   = {IEEE Transactions on Neural Networks and Learning Systems},
  volume    = {28},
  number    = {3},
  pages     = {653--664},
  year      = {2016},
  publisher = {IEEE},
}


@article{amarjyoti2017deep,
  author        = {Amarjyoti, Smruti},
  title         = {Deep reinforcement learning for robotic manipulation-the state of the art},
  journal       = {arXiv preprint arXiv:1701.08878},
  year          = {2017},
  eprint        = {1701.08878},
  archiveprefix = {arXiv},
}


@article{nguyen2021deep,
  author    = {Nguyen, Thanh Thi and Reddi, Vijay Janapa},
  title     = {Deep reinforcement learning for cyber security},
  journal   = {IEEE Transactions on Neural Networks and Learning Systems},
  publisher = {IEEE},
  year      = {2021},
}



@inproceedings{oh2015action,
  author    = {Oh, Junhyuk and Guo, Xiaoxiao and Lee, Honglak and Lewis, Richard L and Singh, Satinder},
  title     = {Action-conditional video prediction using deep networks in {Atari} games},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {28},
  year      = {2015},
}


@article{mnih2013playing,
  author        = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Graves, Alex and Antonoglou, Ioannis and Wierstra, Daan and Riedmiller, Martin},
  title         = {Playing {Atari} with deep reinforcement learning},
  journal       = {arXiv preprint arXiv:1312.5602},
  year          = {2013},
  eprint        = {1312.5602},
  archiveprefix = {arXiv},
}




@inproceedings{schulman2015trust,
  author       = {Schulman, John and Levine, Sergey and Abbeel, Pieter and Jordan, Michael and Moritz, Philipp},
  title        = {Trust region policy optimization},
  booktitle    = {International Conference on Machine Learning},
  pages        = {1889--1897},
  year         = {2015},
  organization = {PMLR},
}



@inproceedings{wu2017scalable,
  author    = {Wu, Yuhuai and Mansimov, Elman and Grosse, Roger B and Liao, Shun and Ba, Jimmy},
  title     = {Scalable trust-region method for deep reinforcement learning using {Kronecker}-factored approximation},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {30},
  year      = {2017},
}


@article{huang2017adversarial,
  author        = {Huang, Sandy and Papernot, Nicolas and Goodfellow, Ian and Duan, Yan and Abbeel, Pieter},
  title         = {Adversarial attacks on neural network policies},
  journal       = {arXiv preprint arXiv:1702.02284},
  year          = {2017},
  eprint        = {1702.02284},
  archiveprefix = {arXiv},
}


@article{chen2018gradient,
  author        = {Chen, Tong and Niu, Wenjia and Xiang, Yingxiao and Bai, Xiaoxuan and Liu, Jiqiang and Han, Zhen and Li, Gang},
  title         = {Gradient band-based adversarial training for generalized attack immunity of {A3C} path finding},
  journal       = {arXiv preprint arXiv:1807.06752},
  year          = {2018},
  eprint        = {1807.06752},
  archiveprefix = {arXiv},
}


@inproceedings{ferdowsi2018robust,
  author       = {Ferdowsi, Aidin and Challita, Ursula and Saad, Walid and Mandayam, Narayan B},
  title        = {Robust deep reinforcement learning for security and safety in autonomous vehicle systems},
  booktitle    = {2018 21st International Conference on Intelligent Transportation Systems (ITSC)},
  organization = {IEEE},
  year         = {2018},
  pages        = {307--312},
}


@book{sutton2018reinforcement,
  author    = {Sutton, Richard S and Barto, Andrew G},
  title     = {Reinforcement learning: An introduction},
  edition   = {Second},
  publisher = {MIT Press},
  year      = {2018},
}


@article{goodfellow2014explaining,
  author        = {Goodfellow, Ian J and Shlens, Jonathon and Szegedy, Christian},
  title         = {Explaining and harnessing adversarial examples},
  journal       = {arXiv preprint arXiv:1412.6572},
  year          = {2014},
  eprint        = {1412.6572},
  archiveprefix = {arXiv},
}



@article{lin2017tactics,
  author        = {Lin, Yen-Chen and Hong, Zhang-Wei and Liao, Yuan-Hong and Shih, Meng-Li and Liu, Ming-Yu and Sun, Min},
  title         = {Tactics of adversarial attack on deep reinforcement learning agents},
  journal       = {arXiv preprint arXiv:1703.06748},
  year          = {2017},
  eprint        = {1703.06748},
  archiveprefix = {arXiv},
}


@article{kos2017delving,
  author        = {Kos, Jernej and Song, Dawn},
  title         = {Delving into adversarial attacks on deep policies},
  journal       = {arXiv preprint arXiv:1705.06452},
  year          = {2017},
  eprint        = {1705.06452},
  archiveprefix = {arXiv},
}


@article{kiourti2019trojan,
  author        = {Kiourti, Panagiota and Wardega, Kacper and Jha, Susmit and Li, Wenchao},
  title         = {{TrojDRL}: Trojan attacks on deep reinforcement learning agents},
  journal       = {arXiv preprint arXiv:1903.06638},
  year          = {2019},
  eprint        = {1903.06638},
  archiveprefix = {arXiv},
}


@inproceedings{lee2020spatiotemporally,
  author    = {Lee, Xian Yeow and Ghadai, Sambit and Tan, Kai Liang and Hegde, Chinmay and Sarkar, Soumik},
  title     = {Spatiotemporally constrained action space attacks on deep reinforcement learning agents},
  booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence},
  year      = {2020},
  volume    = {34},
  number    = {04},
  pages     = {4577--4584},
}


@inproceedings{bai2018adversarial,
  author       = {Bai, Xiaoxuan and Niu, Wenjia and Liu, Jiqiang and Gao, Xu and Xiang, Yingxiao and Liu, Jingjing},
  title        = {Adversarial examples construction towards white-box {Q} table variation in {DQN} pathfinding training},
  booktitle    = {2018 IEEE Third International Conference on Data Science in Cyberspace (DSC)},
  pages        = {781--787},
  year         = {2018},
  organization = {IEEE},
}



@article{gleave2019adversarial,
  author        = {Gleave, Adam and Dennis, Michael and Wild, Cody and Kant, Neel and Levine, Sergey and Russell, Stuart},
  title         = {Adversarial policies: Attacking deep reinforcement learning},
  journal       = {arXiv preprint arXiv:1905.10615},
  year          = {2019},
  eprint        = {1905.10615},
  archiveprefix = {arXiv},
}


@inproceedings{pinto2017robust,
  author       = {Pinto, Lerrel and Davidson, James and Sukthankar, Rahul and Gupta, Abhinav},
  title        = {Robust adversarial reinforcement learning},
  booktitle    = {International Conference on Machine Learning},
  organization = {PMLR},
  year         = {2017},
  pages        = {2817--2826},
}